# KNOWLEDGE3 data mix: 18 datasets, each paired with a sampling weight.
#   DATASET_<n>         - location of one dataset (scratch; later sections
#                         of this file reassign these names).
#   DATASET             - flat "<weight> <path> <weight> <path> ..." list
#                         (scratch; also reassigned later).
#   DATASET_KNOWLEDGE3  - stable copy of DATASET for this mix.
# The weights sum to roughly 1.0.
# NOTE(review): presumably the list is consumed unquoted as a weighted
# data-path blend by the training launcher -- confirm against the caller.
DATASET_1="/data2/indexed_dataset/230530/coig-part_text_document"
DATASET_2="/data2/indexed_dataset/230530/oig-part_text_document"
DATASET_3="/data2/indexed_dataset/230530/jiaocai-clean_text_document"
DATASET_4="/data2/indexed_dataset/230530/paper_full_processed_text_document"
DATASET_5="/data2/indexed_dataset/230530/wg_batch2_zhihu_text_document"
DATASET_6="/data2/indexed_dataset/230530/newspaper_text_document"
DATASET_7="/data2/indexed_dataset/230530/csdn_text_document"
DATASET_8="/data2/indexed_dataset/230530/wg_toutiao_content300_up100_text_document"
DATASET_9="/data2/indexed_dataset/230530/en_dedup-md5-pile-wikipedia_en_text_document"
DATASET_10="/data2/indexed_dataset/230530/cn_baike_text_document"
DATASET_11="/data2/indexed_dataset/230530/pile-books_text_document"
DATASET_12="/data2/indexed_dataset/230530/pile-papers_text_document"
DATASET_13="/data2/indexed_dataset/230530/paper_abstract_processed_text_document"
# NOTE(review): the KNOWLEDGE4/KNOWLEDGE5 mixes read this dataset from
# .../230513/ rather than .../230530/ -- confirm which directory is correct.
DATASET_14="/data2/indexed_dataset/230530/github-issues-filtered-structured_text_document"
DATASET_15="/data2/indexed_dataset/20230605/red-arxiv_text_document"
DATASET_16="/data2/indexed_dataset/20230605/red-stack_text_document"
DATASET_17="/data2/indexed_dataset/20230605/medqa_cn_text_document"
DATASET_18="/data2/indexed_dataset/20230605/medqa_en_text_document"

# One "<weight> <path>" pair per line. Continuation lines must start at
# column 0: a backslash-newline inside double quotes is removed, but any
# indentation on the next line would become part of the value (the previous
# tab-indented layout embedded literal tabs in the string).
DATASET="0.000162639 ${DATASET_1} \
0.004426368 ${DATASET_2} \
0.000166534 ${DATASET_3} \
0.016352866 ${DATASET_4} \
0.102543643 ${DATASET_5} \
0.01687438 ${DATASET_6} \
0.044070303 ${DATASET_7} \
0.002955416 ${DATASET_8} \
0.023779319 ${DATASET_9} \
0.119052866 ${DATASET_10} \
0.173453699 ${DATASET_11} \
0.122679437 ${DATASET_12} \
0.000592826 ${DATASET_13} \
0.102404734 ${DATASET_14} \
0.157529966 ${DATASET_15} \
0.112656526 ${DATASET_16} \
0.000232112 ${DATASET_17} \
0.000881214 ${DATASET_18}"
DATASET_KNOWLEDGE3="${DATASET}"
# Quoted expansion: prints the value verbatim, with no word splitting or
# pathname expansion applied to it.
printf '%s %s\n' "DATASET_KNOWLEDGE3: " "${DATASET_KNOWLEDGE3}"

# KNOWLEDGE4 data mix: 39 datasets, each paired with a sampling weight.
#   DATASET_<n>         - location of one dataset (scratch; other sections
#                         of this file reassign these names).
#   DATASET             - flat "<weight> <path> <weight> <path> ..." list
#                         (scratch; also reassigned by other sections).
#   DATASET_KNOWLEDGE4  - stable copy of DATASET for this mix.
# NOTE(review): presumably the list is consumed unquoted as a weighted
# data-path blend by the training launcher -- confirm against the caller.
DATASET_1="/data2/indexed_dataset/230530/clue_mmlu_text_document"
DATASET_2="/data2/indexed_dataset/230530/coig-part_text_document"
DATASET_3="/data2/indexed_dataset/230530/oig-part_text_document"
DATASET_4="/data2/indexed_dataset/230530/jiaocai-clean_text_document"
DATASET_5="/data2/indexed_dataset/230530/paper_full_processed_text_document"
DATASET_6="/data2/indexed_dataset/230530/wg_batch2_zhihu_text_document"
DATASET_7="/data2/indexed_dataset/230530/newspaper_text_document"
DATASET_8="/data2/indexed_dataset/230530/csdn_text_document"
DATASET_9="/data2/indexed_dataset/230530/wg_toutiao_content300_up100_text_document"
DATASET_10="/data2/indexed_dataset/230530/en_dedup-md5-pile-wikipedia_en_text_document"
DATASET_11="/data2/indexed_dataset/230530/cn_baike_text_document"
DATASET_12="/data2/indexed_dataset/230530/pile-books_text_document"
DATASET_13="/data2/indexed_dataset/230530/pile-papers_text_document"
DATASET_14="/data2/indexed_dataset/230530/paper_abstract_processed_text_document"
DATASET_15="/data2/indexed_dataset/230513/github-issues-filtered-structured_text_document"
DATASET_16="/data2/indexed_dataset/20230605/red-arxiv_text_document"
DATASET_17="/data2/indexed_dataset/20230605/red-stack_text_document"
DATASET_18="/data2/indexed_dataset/20230605/medqa_cn_text_document"
DATASET_19="/data2/indexed_dataset/20230605/medqa_en_text_document"
DATASET_20="/data2/indexed_dataset/20230614/norm-competition-math_text_document"
DATASET_21="/data2/indexed_dataset/20230614/norm-prm800k_text_document"
DATASET_22="/data2/indexed_dataset/20230614/norm-schoolmath_text_document"
DATASET_23="/data2/indexed_dataset/20230614/norm-tiger-zh_text_document"
DATASET_24="/data2/indexed_dataset/20230614/norm-math_text_document"
DATASET_25="/data2/indexed_dataset/20230614/norm-mathamps-khan_text_document"
DATASET_26="/data2/indexed_dataset/20230614/norm-mathamps-mathematica_text_document"
DATASET_27="/data2/indexed_dataset/20230614/falcon_batch1_text_document"
DATASET_28="/data2/indexed_dataset/20230614/wudao_norm_2_text_document"
DATASET_29="/data2/indexed_dataset/230513/c_text_document"
DATASET_30="/data2/indexed_dataset/230513/cpp_text_document"
DATASET_31="/data2/indexed_dataset/230513/git-commits-cleaned_text_document"
DATASET_32="/data2/indexed_dataset/230513/go_text_document"
DATASET_33="/data2/indexed_dataset/230513/java_text_document"
DATASET_34="/data2/indexed_dataset/230513/javascript_text_document"
DATASET_35="/data2/indexed_dataset/230513/jupyter-structured-clean-dedup_text_document"
DATASET_36="/data2/indexed_dataset/230513/jupyter-scripts-dedup-filtered_text_document"
DATASET_37="/data2/indexed_dataset/230513/python_text_document"
DATASET_38="/data2/indexed_dataset/230513/shell_text_document"
DATASET_39="/data2/indexed_dataset/230513/sql_text_document"

# One "<weight> <path>" pair per line. Continuation lines must start at
# column 0: a backslash-newline inside double quotes is removed, but any
# indentation on the next line would become part of the value.
DATASET="0.000030942 ${DATASET_1} \
0.000075828 ${DATASET_2} \
0.002063713 ${DATASET_3} \
0.000077643 ${DATASET_4} \
0.007624226 ${DATASET_5} \
0.047809106 ${DATASET_6} \
0.007867372 ${DATASET_7} \
0.020546976 ${DATASET_8} \
0.001377909 ${DATASET_9} \
0.011086674 ${DATASET_10} \
0.055506230 ${DATASET_11} \
0.080869628 ${DATASET_12} \
0.057197053 ${DATASET_13} \
0.000276394 ${DATASET_14} \
0.007161651 ${DATASET_15} \
0.073445477 ${DATASET_16} \
0.052524053 ${DATASET_17} \
0.000108218 ${DATASET_18} \
0.000410850 ${DATASET_19} \
0.000027724 ${DATASET_20} \
0.000037326 ${DATASET_21} \
0.000230670 ${DATASET_22} \
0.032149520 ${DATASET_23} \
0.000027724 ${DATASET_24} \
0.000213058 ${DATASET_25} \
0.006247222 ${DATASET_26} \
0.316465086 ${DATASET_27} \
0.123905866 ${DATASET_28} \
0.013879362 ${DATASET_29} \
0.011439817 ${DATASET_30} \
0.006585650 ${DATASET_31} \
0.006066391 ${DATASET_32} \
0.016885567 ${DATASET_33} \
0.013406281 ${DATASET_34} \
0.002467256 ${DATASET_35} \
0.002081261 ${DATASET_36} \
0.017816446 ${DATASET_37} \
0.000793237 ${DATASET_38} \
0.003214590 ${DATASET_39}"
DATASET_KNOWLEDGE4="${DATASET}"
# Quoted expansion: prints the value verbatim, with no word splitting or
# pathname expansion applied to it.
printf '%s %s\n' "DATASET_KNOWLEDGE4: " "${DATASET_KNOWLEDGE4}"

# V3 data mix: 21 datasets (batch1 + batch2, tok100k directories), each
# paired with a sampling weight.
#   DATASET_<n>  - location of one dataset (scratch; other sections of this
#                  file reassign these names).
#   DATASET      - flat "<weight> <path> <weight> <path> ..." list (scratch).
#   DATASET_V3   - stable copy of DATASET for this mix.
# The weights here are on a percentage scale: they sum to ~100, not ~1.
# NOTE(review): presumably the consumer normalises the weights -- confirm
# against the caller.
DATASET_1="/data2/indexed_dataset/batch1_batch2_tok100k/batch1_tok100k/en_dedup-md5-pile-openwebtext2_text_document"
DATASET_2="/data2/indexed_dataset/batch1_batch2_tok100k/batch1_tok100k/en_dedup-md5-pile-pile-cc_text_document"
DATASET_3="/data2/indexed_dataset/batch1_batch2_tok100k/batch1_tok100k/wudao-9_text_document"
DATASET_4="/data2/indexed_dataset/batch1_batch2_tok100k/batch1_tok100k/code_dedup-md5-pile-github_text_document"
DATASET_5="/data2/indexed_dataset/batch1_batch2_tok100k/batch1_tok100k/codegeex_text_document"
DATASET_6="/data2/indexed_dataset/batch1_batch2_tok100k/batch1_tok100k/en_dedup-md5-pile-wikipedia_en_text_document"
DATASET_7="/data2/indexed_dataset/batch1_batch2_tok100k/batch1_tok100k/cn_baike_text_document"
DATASET_8="/data2/indexed_dataset/batch1_batch2_tok100k/batch1_tok100k/pile-books_text_document"
DATASET_9="/data2/indexed_dataset/batch1_batch2_tok100k/batch1_tok100k/cn_ebook_merge_maxlen_text_document"
DATASET_10="/data2/indexed_dataset/batch1_batch2_tok100k/batch1_tok100k/pile-papers_text_document"
DATASET_11="/data2/indexed_dataset/batch1_batch2_tok100k/batch1_tok100k/en_dedup-md5-pile-stackexchange_text_document"
DATASET_12="/data2/indexed_dataset/batch1_batch2_tok100k/batch1_tok100k/cn_zhihu_text_document"
DATASET_13="/data2/indexed_dataset/batch1_batch2_tok100k/batch2_tok100k/ccnews_text_document"
DATASET_14="/data2/indexed_dataset/batch1_batch2_tok100k/batch2_tok100k/c4_text_document"
DATASET_15="/data2/indexed_dataset/batch1_batch2_tok100k/batch2_tok100k/wudao-3-8_text_document"
DATASET_16="/data2/indexed_dataset/batch1_batch2_tok100k/batch2_tok100k/hf-wiki_text_document"
DATASET_17="/data2/indexed_dataset/batch1_batch2_tok100k/batch2_tok100k/sjt_text_document"
DATASET_18="/data2/indexed_dataset/batch1_batch2_tok100k/batch2_tok100k/col_text_document"
DATASET_19="/data2/indexed_dataset/batch1_batch2_tok100k/batch2_tok100k/byg-cn_text_document"
DATASET_20="/data2/indexed_dataset/batch1_batch2_tok100k/batch2_tok100k/qa_text_document"
DATASET_21="/data2/indexed_dataset/batch1_batch2_tok100k/batch2_tok100k/wenge-zhihu-high_text_document"

# One "<weight> <path>" pair per line. Continuation lines must start at
# column 0: a backslash-newline inside double quotes is removed, but any
# indentation on the next line would become part of the value.
DATASET="2.242990654 ${DATASET_1} \
5.046728972 ${DATASET_2} \
13.644859810 ${DATASET_3} \
2.336448598 ${DATASET_4} \
1.869158879 ${DATASET_5} \
1.588785047 ${DATASET_6} \
2.336448598 ${DATASET_7} \
4.205607477 ${DATASET_8} \
0.186915888 ${DATASET_9} \
2.429906542 ${DATASET_10} \
1.869158879 ${DATASET_11} \
0.747663551 ${DATASET_12} \
31.775700930 ${DATASET_13} \
12.429906540 ${DATASET_14} \
11.588785050 ${DATASET_15} \
1.869158879 ${DATASET_16} \
0.654205607 ${DATASET_17} \
1.214953271 ${DATASET_18} \
1.121495327 ${DATASET_19} \
0.093457944 ${DATASET_20} \
0.747663551 ${DATASET_21}"
DATASET_V3="${DATASET}"
# Quoted expansion: prints the value verbatim, with no word splitting or
# pathname expansion applied to it.
printf '%s %s\n' "DATASET_V3: " "${DATASET_V3}"

# KNOWLEDGE5 data mix: 51 datasets, each paired with a sampling weight.
#   DATASET_<n>         - location of one dataset (scratch; other sections
#                         of this file reassign these names).
#   DATASET             - flat "<weight> <path> <weight> <path> ..." list
#                         (scratch; also reassigned by other sections).
#   DATASET_KNOWLEDGE5  - stable copy of DATASET for this mix.
# Entries 1-26 and 29-39 live under /data2/indexed_dataset; entries 27-28
# and 40-51 live under /data/2023MMDD directories.
# NOTE(review): presumably the list is consumed unquoted as a weighted
# data-path blend by the training launcher -- confirm against the caller.
DATASET_1="/data2/indexed_dataset/230530/clue_mmlu_text_document"
DATASET_2="/data2/indexed_dataset/230530/coig-part_text_document"
DATASET_3="/data2/indexed_dataset/230530/oig-part_text_document"
DATASET_4="/data2/indexed_dataset/230530/jiaocai-clean_text_document"
DATASET_5="/data2/indexed_dataset/230530/paper_full_processed_text_document"
DATASET_6="/data2/indexed_dataset/230530/wg_batch2_zhihu_text_document"
DATASET_7="/data2/indexed_dataset/230530/newspaper_text_document"
DATASET_8="/data2/indexed_dataset/230530/csdn_text_document"
DATASET_9="/data2/indexed_dataset/230530/wg_toutiao_content300_up100_text_document"
DATASET_10="/data2/indexed_dataset/230530/en_dedup-md5-pile-wikipedia_en_text_document"
DATASET_11="/data2/indexed_dataset/230530/cn_baike_text_document"
DATASET_12="/data2/indexed_dataset/230530/pile-books_text_document"
DATASET_13="/data2/indexed_dataset/230530/pile-papers_text_document"
DATASET_14="/data2/indexed_dataset/230530/paper_abstract_processed_text_document"
DATASET_15="/data2/indexed_dataset/230513/github-issues-filtered-structured_text_document"
DATASET_16="/data2/indexed_dataset/20230605/red-arxiv_text_document"
DATASET_17="/data2/indexed_dataset/20230605/red-stack_text_document"
DATASET_18="/data2/indexed_dataset/20230605/medqa_cn_text_document"
DATASET_19="/data2/indexed_dataset/20230605/medqa_en_text_document"
DATASET_20="/data2/indexed_dataset/20230614/norm-competition-math_text_document"
DATASET_21="/data2/indexed_dataset/20230614/norm-prm800k_text_document"
DATASET_22="/data2/indexed_dataset/20230614/norm-schoolmath_text_document"
DATASET_23="/data2/indexed_dataset/20230614/norm-tiger-zh_text_document"
DATASET_24="/data2/indexed_dataset/20230614/norm-math_text_document"
DATASET_25="/data2/indexed_dataset/20230614/norm-mathamps-khan_text_document"
DATASET_26="/data2/indexed_dataset/20230614/norm-mathamps-mathematica_text_document"
DATASET_27="/data/20230702/falcon_batch2_text_document"
DATASET_28="/data/20230702/wudao_norm_1_text_document"
DATASET_29="/data2/indexed_dataset/230513/c_text_document"
DATASET_30="/data2/indexed_dataset/230513/cpp_text_document"
DATASET_31="/data2/indexed_dataset/230513/git-commits-cleaned_text_document"
DATASET_32="/data2/indexed_dataset/230513/go_text_document"
DATASET_33="/data2/indexed_dataset/230513/java_text_document"
DATASET_34="/data2/indexed_dataset/230513/javascript_text_document"
DATASET_35="/data2/indexed_dataset/230513/jupyter-structured-clean-dedup_text_document"
DATASET_36="/data2/indexed_dataset/230513/jupyter-scripts-dedup-filtered_text_document"
DATASET_37="/data2/indexed_dataset/230513/python_text_document"
DATASET_38="/data2/indexed_dataset/230513/shell_text_document"
DATASET_39="/data2/indexed_dataset/230513/sql_text_document"
DATASET_40="/data/20230704/ccmatrix-zh-en_text_document"
DATASET_41="/data/20230704/tsl2019_text_document"
DATASET_42="/data/20230704/csl_text_document"
DATASET_43="/data/20230702/kg-zy_text_document"
DATASET_44="/data/20230704/mnbvc-gov_text_document"
DATASET_45="/data/20230704/mnbvc-qa_text_document"
DATASET_46="/data/20230704/mnbvc-qaen_text_document"
DATASET_47="/data/20230704/mnbvc-wiki_text_document"
DATASET_48="/data/20230704/norm-baikeqa_text_document"
DATASET_49="/data/20230704/mnbvc-xxqg_text_document"
DATASET_50="/data/20230704/mnbvc-news_text_document"
DATASET_51="/data/20230704/mnbvc-co-ann-report_text_document"

# One "<weight> <path>" pair per line. Continuation lines must start at
# column 0: a backslash-newline inside double quotes is removed, but any
# indentation on the next line would become part of the value.
DATASET="0.000029445 ${DATASET_1} \
0.000072158 ${DATASET_2} \
0.001963836 ${DATASET_3} \
0.000073886 ${DATASET_4} \
0.007255237 ${DATASET_5} \
0.045495293 ${DATASET_6} \
0.007486616 ${DATASET_7} \
0.039105132 ${DATASET_8} \
0.001311223 ${DATASET_9} \
0.010550114 ${DATASET_10} \
0.052819900 ${DATASET_11} \
0.076955788 ${DATASET_12} \
0.054428893 ${DATASET_13} \
0.000263018 ${DATASET_14} \
0.006815050 ${DATASET_15} \
0.069890943 ${DATASET_16} \
0.049982051 ${DATASET_17} \
0.000102980 ${DATASET_18} \
0.000390966 ${DATASET_19} \
0.000008794 ${DATASET_20} \
0.000011840 ${DATASET_21} \
0.000073169 ${DATASET_22} \
0.030593583 ${DATASET_23} \
0.000026382 ${DATASET_24} \
0.000202747 ${DATASET_25} \
0.001981625 ${DATASET_26} \
0.301181480 ${DATASET_27} \
0.150872077 ${DATASET_28} \
0.013207644 ${DATASET_29} \
0.010886165 ${DATASET_30} \
0.006266925 ${DATASET_31} \
0.005772797 ${DATASET_32} \
0.016068358 ${DATASET_33} \
0.012757458 ${DATASET_34} \
0.001980534 ${DATASET_35} \
0.002347849 ${DATASET_36} \
0.016954185 ${DATASET_37} \
0.000754847 ${DATASET_38} \
0.003059014 ${DATASET_39} \
0.000059718 ${DATASET_40} \
0.000705214 ${DATASET_41} \
0.001058247 ${DATASET_42} \
0.001156925 ${DATASET_43} \
0.000016870 ${DATASET_44} \
0.001156909 ${DATASET_45} \
0.000315041 ${DATASET_46} \
0.011401359 ${DATASET_47} \
0.000877942 ${DATASET_48} \
0.000397255 ${DATASET_49} \
0.001670916 ${DATASET_50} \
0.008678739 ${DATASET_51}"
DATASET_KNOWLEDGE5="${DATASET}"
# Quoted expansion: prints the value verbatim, with no word splitting or
# pathname expansion applied to it.
printf '%s %s\n' "DATASET_KNOWLEDGE5: " "${DATASET_KNOWLEDGE5}"

# KNOWLEDGE6 data mix: 14 datasets under /data/binary_data, each paired
# with a sampling weight.
#   DATASET_<n>         - location of one dataset (scratch; other sections
#                         of this file reassign these names).
#   DATASET             - flat "<weight> <path> <weight> <path> ..." list
#                         (scratch; also reassigned by other sections).
#   DATASET_KNOWLEDGE6  - stable copy of DATASET for this mix.
# The weights sum to exactly 1.0.
# NOTE(review): presumably the list is consumed unquoted as a weighted
# data-path blend by the training launcher -- confirm against the caller.
DATASET_1="/data/binary_data/cn_baike_text_document"
DATASET_2="/data/binary_data/cn_book_paper_text_document"
DATASET_3="/data/binary_data/code_v02_train_text_document"
DATASET_4="/data/binary_data/en_dedup-md5-pile-stackexchange_text_document"
DATASET_5="/data/binary_data/en_dedup-md5-pile-wikipedia_en_text_document"
DATASET_6="/data/binary_data/falcon_batch05_text_document"
DATASET_7="/data/binary_data/kbqa_text_document"
DATASET_8="/data/binary_data/mnbvc_text_document"
DATASET_9="/data/binary_data/newspaper_text_document"
DATASET_10="/data/binary_data/red-arxiv_text_document"
DATASET_11="/data/binary_data/wg_batch2_zhihu_text_document"
DATASET_12="/data/binary_data/wg_toutiao_content300_up100_text_document"
DATASET_13="/data/binary_data/wudao-9_text_document"
DATASET_14="/data/binary_data/red-book_text_document"

# One "<weight> <path>" pair per line. Continuation lines must start at
# column 0: a backslash-newline inside double quotes is removed, but any
# indentation on the next line would become part of the value.
DATASET="0.050000000 ${DATASET_1} \
0.075000000 ${DATASET_2} \
0.100000000 ${DATASET_3} \
0.050000000 ${DATASET_4} \
0.050000000 ${DATASET_5} \
0.300000000 ${DATASET_6} \
0.015000000 ${DATASET_7} \
0.047500000 ${DATASET_8} \
0.015000000 ${DATASET_9} \
0.100000000 ${DATASET_10} \
0.010000000 ${DATASET_11} \
0.002500000 ${DATASET_12} \
0.085000000 ${DATASET_13} \
0.100000000 ${DATASET_14}"
DATASET_KNOWLEDGE6="${DATASET}"
# Quoted expansion: prints the value verbatim, with no word splitting or
# pathname expansion applied to it.
printf '%s %s\n' "DATASET_KNOWLEDGE6: " "${DATASET_KNOWLEDGE6}"

# DX_KNOWLEDGE6 data mix: the same 14 dataset names and weights as the
# KNOWLEDGE6 mix, but rooted at /share/binary_data.
#   DATASET_<n>            - location of one dataset (scratch; other
#                            sections of this file reassign these names).
#   DATASET                - flat "<weight> <path> ..." list (scratch).
#   DATASET_DX_KNOWLEDGE6  - stable copy of DATASET for this mix.
# The weights sum to exactly 1.0.
# NOTE(review): "DX" presumably identifies the cluster/site that mounts
# /share/binary_data -- confirm.
DATASET_1="/share/binary_data/cn_baike_text_document"
DATASET_2="/share/binary_data/cn_book_paper_text_document"
DATASET_3="/share/binary_data/code_v02_train_text_document"
DATASET_4="/share/binary_data/en_dedup-md5-pile-stackexchange_text_document"
DATASET_5="/share/binary_data/en_dedup-md5-pile-wikipedia_en_text_document"
DATASET_6="/share/binary_data/falcon_batch05_text_document"
DATASET_7="/share/binary_data/kbqa_text_document"
DATASET_8="/share/binary_data/mnbvc_text_document"
DATASET_9="/share/binary_data/newspaper_text_document"
DATASET_10="/share/binary_data/red-arxiv_text_document"
DATASET_11="/share/binary_data/wg_batch2_zhihu_text_document"
DATASET_12="/share/binary_data/wg_toutiao_content300_up100_text_document"
DATASET_13="/share/binary_data/wudao-9_text_document"
DATASET_14="/share/binary_data/red-book_text_document"

# One "<weight> <path>" pair per line. Continuation lines must start at
# column 0: a backslash-newline inside double quotes is removed, but any
# indentation on the next line would become part of the value.
DATASET="0.050000000 ${DATASET_1} \
0.075000000 ${DATASET_2} \
0.100000000 ${DATASET_3} \
0.050000000 ${DATASET_4} \
0.050000000 ${DATASET_5} \
0.300000000 ${DATASET_6} \
0.015000000 ${DATASET_7} \
0.047500000 ${DATASET_8} \
0.015000000 ${DATASET_9} \
0.100000000 ${DATASET_10} \
0.010000000 ${DATASET_11} \
0.002500000 ${DATASET_12} \
0.085000000 ${DATASET_13} \
0.100000000 ${DATASET_14}"
DATASET_DX_KNOWLEDGE6="${DATASET}"
# Quoted expansion: prints the value verbatim, with no word splitting or
# pathname expansion applied to it.
printf '%s %s\n' "DATASET_DX_KNOWLEDGE6: " "${DATASET_DX_KNOWLEDGE6}"

# JD_KNOWLEDGE6 data mix: the same 14 dataset names and weights as the
# KNOWLEDGE6 mix, but rooted at /share/project/batch7_tok100k.
#   DATASET_<n>            - location of one dataset (scratch; other
#                            sections of this file reassign these names).
#   DATASET                - flat "<weight> <path> ..." list (scratch).
#   DATASET_JD_KNOWLEDGE6  - stable copy of DATASET for this mix.
# The weights sum to exactly 1.0.
# NOTE(review): "JD" presumably identifies the cluster/site that mounts
# /share/project -- confirm.
DATASET_1="/share/project/batch7_tok100k/cn_baike_text_document"
DATASET_2="/share/project/batch7_tok100k/cn_book_paper_text_document"
DATASET_3="/share/project/batch7_tok100k/code_v02_train_text_document"
DATASET_4="/share/project/batch7_tok100k/en_dedup-md5-pile-stackexchange_text_document"
DATASET_5="/share/project/batch7_tok100k/en_dedup-md5-pile-wikipedia_en_text_document"
DATASET_6="/share/project/batch7_tok100k/falcon_batch05_text_document"
DATASET_7="/share/project/batch7_tok100k/kbqa_text_document"
DATASET_8="/share/project/batch7_tok100k/mnbvc_text_document"
DATASET_9="/share/project/batch7_tok100k/newspaper_text_document"
DATASET_10="/share/project/batch7_tok100k/red-arxiv_text_document"
DATASET_11="/share/project/batch7_tok100k/wg_batch2_zhihu_text_document"
DATASET_12="/share/project/batch7_tok100k/wg_toutiao_content300_up100_text_document"
DATASET_13="/share/project/batch7_tok100k/wudao-9_text_document"
DATASET_14="/share/project/batch7_tok100k/red-book_text_document"

# One "<weight> <path>" pair per line. Continuation lines must start at
# column 0: a backslash-newline inside double quotes is removed, but any
# indentation on the next line would become part of the value.
DATASET="0.050000000 ${DATASET_1} \
0.075000000 ${DATASET_2} \
0.100000000 ${DATASET_3} \
0.050000000 ${DATASET_4} \
0.050000000 ${DATASET_5} \
0.300000000 ${DATASET_6} \
0.015000000 ${DATASET_7} \
0.047500000 ${DATASET_8} \
0.015000000 ${DATASET_9} \
0.100000000 ${DATASET_10} \
0.010000000 ${DATASET_11} \
0.002500000 ${DATASET_12} \
0.085000000 ${DATASET_13} \
0.100000000 ${DATASET_14}"
DATASET_JD_KNOWLEDGE6="${DATASET}"
# Quoted expansion: prints the value verbatim, with no word splitting or
# pathname expansion applied to it.
printf '%s %s\n' "DATASET_JD_KNOWLEDGE6: " "${DATASET_JD_KNOWLEDGE6}"

# JD_V3 data mix: the same 21 dataset names and weights as the V3 mix, but
# rooted at /share/projset/LM_data/batch1_batch2_tok100k.
#   DATASET_<n>    - location of one dataset (scratch; other sections of
#                    this file reassign these names).
#   DATASET        - flat "<weight> <path> <weight> <path> ..." list
#                    (scratch).
#   DATASET_JD_V3  - stable copy of DATASET for this mix.
# The weights here are on a percentage scale: they sum to ~100, not ~1.
# NOTE(review): presumably the consumer normalises the weights, and "JD"
# identifies the cluster/site that mounts /share/projset -- confirm.
DATASET_1="/share/projset/LM_data/batch1_batch2_tok100k/batch1_tok100k/en_dedup-md5-pile-openwebtext2_text_document"
DATASET_2="/share/projset/LM_data/batch1_batch2_tok100k/batch1_tok100k/en_dedup-md5-pile-pile-cc_text_document"
DATASET_3="/share/projset/LM_data/batch1_batch2_tok100k/batch1_tok100k/wudao-9_text_document"
DATASET_4="/share/projset/LM_data/batch1_batch2_tok100k/batch1_tok100k/code_dedup-md5-pile-github_text_document"
DATASET_5="/share/projset/LM_data/batch1_batch2_tok100k/batch1_tok100k/codegeex_text_document"
DATASET_6="/share/projset/LM_data/batch1_batch2_tok100k/batch1_tok100k/en_dedup-md5-pile-wikipedia_en_text_document"
DATASET_7="/share/projset/LM_data/batch1_batch2_tok100k/batch1_tok100k/cn_baike_text_document"
DATASET_8="/share/projset/LM_data/batch1_batch2_tok100k/batch1_tok100k/pile-books_text_document"
DATASET_9="/share/projset/LM_data/batch1_batch2_tok100k/batch1_tok100k/cn_ebook_merge_maxlen_text_document"
DATASET_10="/share/projset/LM_data/batch1_batch2_tok100k/batch1_tok100k/pile-papers_text_document"
DATASET_11="/share/projset/LM_data/batch1_batch2_tok100k/batch1_tok100k/en_dedup-md5-pile-stackexchange_text_document"
DATASET_12="/share/projset/LM_data/batch1_batch2_tok100k/batch1_tok100k/cn_zhihu_text_document"
DATASET_13="/share/projset/LM_data/batch1_batch2_tok100k/batch2_tok100k/ccnews_text_document"
DATASET_14="/share/projset/LM_data/batch1_batch2_tok100k/batch2_tok100k/c4_text_document"
DATASET_15="/share/projset/LM_data/batch1_batch2_tok100k/batch2_tok100k/wudao-3-8_text_document"
DATASET_16="/share/projset/LM_data/batch1_batch2_tok100k/batch2_tok100k/hf-wiki_text_document"
DATASET_17="/share/projset/LM_data/batch1_batch2_tok100k/batch2_tok100k/sjt_text_document"
DATASET_18="/share/projset/LM_data/batch1_batch2_tok100k/batch2_tok100k/col_text_document"
DATASET_19="/share/projset/LM_data/batch1_batch2_tok100k/batch2_tok100k/byg-cn_text_document"
DATASET_20="/share/projset/LM_data/batch1_batch2_tok100k/batch2_tok100k/qa_text_document"
DATASET_21="/share/projset/LM_data/batch1_batch2_tok100k/batch2_tok100k/wenge-zhihu-high_text_document"

# One "<weight> <path>" pair per line. Continuation lines must start at
# column 0: a backslash-newline inside double quotes is removed, but any
# indentation on the next line would become part of the value.
DATASET="2.242990654 ${DATASET_1} \
5.046728972 ${DATASET_2} \
13.644859810 ${DATASET_3} \
2.336448598 ${DATASET_4} \
1.869158879 ${DATASET_5} \
1.588785047 ${DATASET_6} \
2.336448598 ${DATASET_7} \
4.205607477 ${DATASET_8} \
0.186915888 ${DATASET_9} \
2.429906542 ${DATASET_10} \
1.869158879 ${DATASET_11} \
0.747663551 ${DATASET_12} \
31.775700930 ${DATASET_13} \
12.429906540 ${DATASET_14} \
11.588785050 ${DATASET_15} \
1.869158879 ${DATASET_16} \
0.654205607 ${DATASET_17} \
1.214953271 ${DATASET_18} \
1.121495327 ${DATASET_19} \
0.093457944 ${DATASET_20} \
0.747663551 ${DATASET_21}"
DATASET_JD_V3="${DATASET}"
# Quoted expansion: prints the value verbatim, with no word splitting or
# pathname expansion applied to it.
printf '%s %s\n' "DATASET_JD_V3: " "${DATASET_JD_V3}"
